"""配置文件"""
# --- Dataset settings -------------------------------------------------------
# Maximum text length (unit is not shown here — presumably tokens; TODO confirm).
MAX_LENGTH: int = 40
# Size of the dataset buffer (presumably the shuffle buffer — verify against
# the data pipeline that consumes it).
BUFFER_SIZE: int = 20000
# Batch size.
BATCH_SIZE: int = 64

# --- Data files -------------------------------------------------------------
# Where the (processed) dataset is stored.
data_path: str = "../data/processed_en-ch.txt"
# Data used when testing the model.
test_data_path: str = "../data/test.txt"

# --- Tokenizer vocabularies -------------------------------------------------
# Vocabulary path for the input data.
input_tokenizer_path: str = "../tokenizer/en"
# Vocabulary path for the target data.
target_tokenizer_path: str = "../tokenizer/ch"

# --- Checkpoints ------------------------------------------------------------
# Checkpoint location used for test runs (presumably; no comment in the original).
test_checkpoint_path: str = "checkpoint/base_model/test"
# Where the model is saved.
checkpoint_path: str = "checkpoint/base_model/en-ch"
# NOTE(review): same value as checkpoint_path — confirm whether a distinct
# directory was intended for this second checkpoint path.
checkpoint_path_02: str = "checkpoint/base_model/en-ch"


# --- Training / testing -----------------------------------------------------
# Epoch count (presumably the number of passes over the training data).
epochs: int = 20


# --- Hyperparameters --------------------------------------------------------
# Hidden dimension of the encoder and decoder (embedding_dim).
d_model: int = 256
# Number of encoder layers.
num_layers: int = 4
# Number of self-attention heads.
num_heads: int = 8
# Hidden dimension of the fully connected layer.
dff: int = 512

# Probability of randomly dropping neurons (guards against overfitting).
dropout_rate: float = 0.1
